{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import sys\n",
    "import pandas as pd \n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import missingno as msno\n",
    "import seaborn as sns\n",
    "import warnings\n",
    "warnings.filterwarnings('ignore')\n",
    "%matplotlib inline\n",
    "from scipy.stats import *\n",
    "import math\n",
    "\n",
    "from tools.config import CONFIG"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['/home/wuxiang/data-vol-1/comptetition/mycode/tools/../../dataset/csv_merged_dataset/A1_MERGE.csv',\n",
       " '/home/wuxiang/data-vol-1/comptetition/mycode/tools/../../dataset/csv_merged_dataset/A3_MERGE.csv',\n",
       " '/home/wuxiang/data-vol-1/comptetition/mycode/tools/../../dataset/csv_merged_dataset/B_MERGE.csv',\n",
       " '/home/wuxiang/data-vol-1/comptetition/mycode/tools/../../dataset/csv_merged_dataset/A2_MERGE.csv',\n",
       " '/home/wuxiang/data-vol-1/comptetition/mycode/tools/../../dataset/csv_merged_dataset/C_MERGE.csv',\n",
       " '/home/wuxiang/data-vol-1/comptetition/mycode/tools/../../dataset/csv_merged_dataset/A_MERGE.csv']"
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "path = CONFIG().MERGED_DATASET_PATH\n",
    "targets = [os.path.join(path, i) for i in os.listdir(path)]\n",
    "targets"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "2    8371\n",
       "1    8371\n",
       "0    8371\n",
       "Name: date_sub, dtype: int64"
      ]
     },
     "execution_count": 36,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df = pd.read_csv(targets[1], nrows=None)\n",
    "features = CONFIG().YB_FEATURES['A']\n",
    "df['date_sub'].value_counts()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([1, 2, 3])"
      ]
     },
     "execution_count": 51,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "a = pd.DataFrame()\n",
    "b = pd.DataFrame(np.array([1,2,3]),columns=['s'])\n",
    "c = pd.concat([a,b],axis=1)\n",
    "d = np.array(c).reshape(-1)\n",
    "d"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
